[1]:
from ckg.graphdb_builder import builder_utils
[2]:
# Relative path to the example mzTab file parsed in the following cells.
# NOTE(review): "PXD022733" looks like a PRIDE project accession — confirm.
example_file = 'tmp/example_PXD022733.mzTab'
[4]:
# Parse the mzTab file. Judging by the recorded outputs, the result is a
# dict-like object keyed by section name whose values are table-like
# (the 'PRT' entry supports .head()) — confirm against parse_mztab_file.
data = builder_utils.parse_mztab_file(example_file)
[6]:
# Show which sections the parser returned for this file.
print(data.keys())
dict_keys(['MTD', 'PRT', 'PSM'])
[8]:
# Preview the first rows of the 'PRT' table (per-accession rows, judging by
# the columns shown in the recorded output).
data['PRT'].head()
[8]:
| | accession | description | taxid | species | database | database_version | search_engine | best_search_engine_score[1] | search_engine_score[1]_ms_run[1] | search_engine_score[1]_ms_run[2] | ... | num_peptides_unique_ms_run[254] | num_peptides_unique_ms_run[255] | num_peptides_unique_ms_run[256] | num_peptides_unique_ms_run[257] | num_peptides_unique_ms_run[258] | num_peptides_unique_ms_run[259] | ambiguity_members | modifications | protein_coverage | opt_global_cv_MS:1002217_decoy_peptide |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | A0A075B6I9 | sp|A0A075B6I9|LV746_HUMAN Immunoglobulin lambd... | null | null | null | null | [MS, MS:1002337, Andromeda, 1.6.8.0] | 2.54172068110967 | null | null | ... | null | null | null | null | null | null | A0A075B6I9, P04211 | null | 0.137 | 0 |
1 | A0A075B6K5 | sp|A0A075B6K5|LV39_HUMAN Immunoglobulin lambda... | null | null | null | null | [MS, MS:1002337, Andromeda, 1.6.8.0] | 12.3898963082584 | null | null | ... | null | null | null | null | null | null | A0A075B6K5, P80748 | null | 0.139 | 0 |
2 | A0A075B6P5 | sp|A0A075B6P5|KV228_HUMAN Immunoglobulin kappa... | null | null | null | null | [MS, MS:1002337, Andromeda, 1.6.8.0] | 37.2781261617028 | null | null | ... | null | null | null | null | null | null | A0A075B6P5, A0A087WW87, P01615, P01614, A2NJV5... | null | 0.167 | 0 |
3 | A0A0C4DH67 | sp|A0A0C4DH67|KV108_HUMAN Immunoglobulin kappa... | null | null | null | null | [MS, MS:1002337, Andromeda, 1.6.8.0] | 2.75929244987718 | null | null | ... | null | null | null | null | null | null | A0A0C4DH67, A0A0C4DH69, A0A075B6S5 | null | 0.139 | 0 |
4 | A0A0A0MRZ8 | sp|A0A0A0MRZ8|KVD11_HUMAN Immunoglobulin kappa... | null | null | null | null | [MS, MS:1002337, Andromeda, 1.6.8.0] | 10.1196640910864 | null | null | ... | null | null | null | null | null | null | A0A0A0MRZ8, P04433 | null | 0.322 | 0 |
5 rows × 1048 columns